This case study is Monthly production central statistics of food and beverages from year 1997-2011. The data is in the csv format.

Step-1: Frame the Problem: Identify the key question are you trying to answer

Plot the interactive plots for the data set.

Step-2: Acquire the Data: Get the dataset to answer the question.

Acquire the data from the csv file and load it.

setwd="F:\\GLIMS-PGPBDA\\Assignments\\SVAP-Assignment\\Assignment-3\\"
rawdata = read.csv("Production-Department_of_Agriculture_and_Cooperation_1.csv")
str(rawdata)
'data.frame':   429 obs. of  25 variables:
 $ Particulars: Factor w/ 429 levels "(DC)Agricultural Coverage Under Irrigation",..: 8 109 119 121 140 141 226 106 107 108 ...
 $ Frequency  : Factor w/ 1 level "Annual, Ending mar Of Each Year": 1 1 1 1 1 1 1 1 1 1 ...
 $ Unit       : Factor w/ 7 levels "%","Bale mn",..: 5 5 5 5 5 5 5 5 5 5 ...
 $ X3.1993    : int  NA NA NA NA NA NA NA NA NA NA ...
 $ X3.1994    : int  NA NA NA NA NA NA NA NA NA NA ...
 $ X3.1995    : int  NA NA NA NA NA NA NA NA NA NA ...
 $ X3.1996    : num  NA NA NA NA NA NA NA NA NA NA ...
 $ X3.1997    : num  NA NA NA NA NA NA NA NA NA NA ...
 $ X3.1998    : num  NA NA NA NA NA NA NA NA NA NA ...
 $ X3.1999    : num  NA NA NA NA NA NA NA NA NA NA ...
 $ X3.2000    : num  NA NA NA NA NA NA NA NA NA NA ...
 $ X3.2001    : num  NA NA NA NA NA NA NA NA NA NA ...
 $ X3.2002    : num  NA NA NA NA NA NA NA NA NA NA ...
 $ X3.2003    : num  NA NA NA NA NA NA NA NA NA NA ...
 $ X3.2004    : num  NA NA NA NA NA NA NA NA NA NA ...
 $ X3.2005    : num  198.4 103.3 95.1 83.1 72.2 ...
 $ X3.2006    : num  208.6 109.9 98.7 91.8 78.3 ...
 $ X3.2007    : num  217.3 110.6 106.7 93.4 80.2 ...
 $ X3.2008    : num  230.8 121 109.8 96.7 82.7 ...
 $ X3.2009    : num  234.5 118.1 116.3 99.2 84.9 ...
 $ X3.2010    : num  218.1 104 114.2 89.1 75.9 ...
 $ X3.2011    : num  244.5 120.9 123.6 96 80.7 ...
 $ X3.2012    : num  259.3 131.3 128 105.3 92.8 ...
 $ X3.2013    : num  257.1 128.1 129.1 105.2 92.4 ...
 $ X3.2014    : num  264 129 135 106 92 ...

Step-3: Refine the Data: Do the basic refinement to clean up the dataset.

Have only the data related to area wise food grain production

library(tidyr)
rawdata = rawdata[grepl('Agricultural Production Foodgrains Area ',rawdata$Particulars),]
rawdata = rawdata[!grepl('Agricultural Production Foodgrains Area 5 Yr',rawdata$Particulars),]
rawdata = rawdata[,-2:-14]
str(rawdata)
'data.frame':   18 obs. of  12 variables:
 $ Particulars: Factor w/ 429 levels "(DC)Agricultural Coverage Under Irrigation",..: 10 11 12 13 14 15 16 17 18 19 ...
 $ X3.2004    : num  6.81 2.74 7.01 5.07 4.03 ...
 $ X3.2005    : num  6.27 2.58 6.46 5.13 3.72 ...
 $ X3.2006    : num  7.17 2.6 6.55 5.15 3.97 ...
 $ X3.2007    : num  7.27 2.38 6.7 5.06 4.57 ...
 $ X3.2008    : num  7.39 2.52 7.03 5.08 4.48 ...
 $ X3.2009    : num  7.44 2.67 6.92 4.96 4.06 ...
 $ X3.2010    : num  6.67 2.7 6.63 4.86 3.69 ...
 $ X3.2011    : num  8.03 2.77 6.24 4.96 4.53 ...
 $ X3.2012    : num  7.29 2.74 6.7 4.96 4.74 ...
 $ X3.2013    : num  6.85 2.52 6.71 5.04 3.68 ...
 $ X3.2014    : num  NA NA NA NA NA NA NA NA NA NA ...

Step-4: Transform the Data: Do the transformation needed for the dataset.

Do the following transformations in the data. Split the Particulars column name and have the State in seperate column

library(splitstackshape)
rawdata$Particulars = as.character(rawdata$Particulars)
rawdata = cSplit(rawdata, "Particulars", " ")
rawdata = rawdata[ , -c("Particulars_1","Particulars_2","Particulars_3","Particulars_4")]
 rawdata$State = paste(rawdata$Particulars_5,rawdata$Particulars_6)
 rawdata = rawdata[ , -c("Particulars_5","Particulars_6","X3.2014")]
 rawdata$State = sub("NA","",rawdata$State)
 
 rawdata$TotalStats = rawdata$X3.2004+rawdata$X3.2005+rawdata$X3.2006+rawdata$X3.2007+rawdata$X3.2008+rawdata$X3.2009+rawdata$X3.2010+rawdata$X3.2011+rawdata$X3.2012+rawdata$X3.2013
 rawdata

Step-5: Explore the Data: Create the 3 - 4 individual visualisation that explore the dataset.

Exploring the data by creating the visualisations

library(ggplot2)
library(plotly)
library(knitr)
library(DT)
ggplot(rawdata) + aes(rawdata$State,weight = rawdata$X3.2004 , color = rawdata$State) + geom_bar()

ggplot(rawdata) + aes(rawdata$State,weight = rawdata$X3.2005) + geom_bar()

ggplot(rawdata) + aes(rawdata$State,weight = rawdata$X3.2006) + geom_bar()

ggplot(rawdata) + aes(rawdata$State,weight = rawdata$X3.2007) + geom_bar()

ggplot(rawdata) + aes(rawdata$State,weight = rawdata$X3.2008) + geom_bar()

ggplot(rawdata) + aes(rawdata$State,weight = rawdata$X3.2009) + geom_bar()

ggplot(rawdata) + aes(rawdata$State,weight = rawdata$X3.2010) + geom_bar()

ggplot(rawdata) + aes(rawdata$State,weight = rawdata$X3.2011) + geom_bar()

ggplot(rawdata) + aes(rawdata$State,weight = rawdata$X3.2012) + geom_bar()

ggplot(rawdata) + aes(rawdata$State,weight = rawdata$X3.2013) + geom_bar()

ggplot(rawdata) + aes(rawdata$State,weight = rawdata$TotalStats) + geom_bar()

datatable(rawdata,option = list(pagelength = 5))

library(ggplot2)
plot1 = ggplot(rawdata) + aes(rawdata$State,rawdata$TotalStats , color=rawdata$State ) + geom_point()
library(plotly)
ggplotly(plot1)

library(crosstalk)
library(d3scatter)
shared_rawdata <- SharedData$new(rawdata)
bscols(
  list(
    filter_checkbox("State", "StateSelect", shared_rawdata, ~State, inline = TRUE),
    filter_slider("TotalStats", "TotalStats", shared_rawdata, ~TotalStats, width = "100%")
  ),
  d3scatter(shared_rawdata, ~TotalStats, ~X3.2004, ~State, width="100%", height=300),
  d3scatter(shared_rawdata, ~TotalStats, ~X3.2005, ~State, width="100%", height=300)
)
LS0tDQp0aXRsZTogIlNhbnRvc2hBZ2FzdHlhcmFqdV9TVkFQX0FzbXRfUjMiDQphdXRob3I6ICJTYW50b3NoIEFnYXN0eWFyYWp1Ig0KZGF0ZTogIkp1bHkgOCwgMjAxNyINCm91dHB1dDoNCiAgaHRtbF9ub3RlYm9vazogZGVmYXVsdA0KICB3b3JkX2RvY3VtZW50OiBkZWZhdWx0DQotLS0NCg0KYGBge3Igc2V0dXAsIGluY2x1ZGU9RkFMU0V9DQprbml0cjo6b3B0c19jaHVuayRzZXQoZWNobyA9IFRSVUUpDQpgYGANCg0KVGhpcyBjYXNlIHN0dWR5IGlzIE1vbnRobHkgcHJvZHVjdGlvbiBjZW50cmFsIHN0YXRpc3RpY3Mgb2YgZm9vZCBhbmQgYmV2ZXJhZ2VzIGZyb20geWVhciAxOTk3LTIwMTEuIFRoZSBkYXRhIGlzIGluIHRoZSBjc3YgZm9ybWF0Lg0KDQojU3RlcC0xOiBGcmFtZSB0aGUgUHJvYmxlbTogSWRlbnRpZnkgdGhlIGtleSBxdWVzdGlvbiBhcmUgeW91IHRyeWluZyB0byBhbnN3ZXINCg0KICBQbG90IHRoZSBpbnRlcmFjdGl2ZSBwbG90cyBmb3IgdGhlIGRhdGEgc2V0Lg0KICANCiNTdGVwLTI6IEFjcXVpcmUgdGhlIERhdGE6IEdldCB0aGUgZGF0YXNldCB0byBhbnN3ZXIgdGhlIHF1ZXN0aW9uLg0KICANCiAgQWNxdWlyZSB0aGUgZGF0YSBmcm9tIHRoZSBjc3YgZmlsZSBhbmQgbG9hZCBpdC4NCiAgDQpgYGAge3IgRGF0YVJlYWR9DQpzZXR3ZD0iRjpcXEdMSU1TLVBHUEJEQVxcQXNzaWdubWVudHNcXFNWQVAtQXNzaWdubWVudFxcQXNzaWdubWVudC0zXFwiDQpyYXdkYXRhID0gcmVhZC5jc3YoIlByb2R1Y3Rpb24tRGVwYXJ0bWVudF9vZl9BZ3JpY3VsdHVyZV9hbmRfQ29vcGVyYXRpb25fMS5jc3YiKQ0Kc3RyKHJhd2RhdGEpDQpgYGANCg0KI1N0ZXAtMzogUmVmaW5lIHRoZSBEYXRhOiBEbyB0aGUgYmFzaWMgcmVmaW5lbWVudCB0byBjbGVhbiB1cCB0aGUgZGF0YXNldC4NCg0KICBIYXZlIG9ubHkgdGhlIGRhdGEgcmVsYXRlZCB0byBhcmVhIHdpc2UgZm9vZCBncmFpbiBwcm9kdWN0aW9uDQoNCmBgYHtyfQ0KbGlicmFyeSh0aWR5cikNCnJhd2RhdGEgPSByYXdkYXRhW2dyZXBsKCdBZ3JpY3VsdHVyYWwgUHJvZHVjdGlvbiBGb29kZ3JhaW5zIEFyZWEgJyxyYXdkYXRhJFBhcnRpY3VsYXJzKSxdDQpyYXdkYXRhID0gcmF3ZGF0YVshZ3JlcGwoJ0FncmljdWx0dXJhbCBQcm9kdWN0aW9uIEZvb2RncmFpbnMgQXJlYSA1IFlyJyxyYXdkYXRhJFBhcnRpY3VsYXJzKSxdDQpyYXdkYXRhID0gcmF3ZGF0YVssLTI6LTE0XQ0Kc3RyKHJhd2RhdGEpDQpgYGANCg0KI1N0ZXAtNDogVHJhbnNmb3JtIHRoZSBEYXRhOiBEbyB0aGUgdHJhbnNmb3JtYXRpb24gbmVlZGVkIGZvciB0aGUgZGF0YXNldC4NCg0KICBEbyB0aGUgZm9sbG93aW5nIHRyYW5zZm9ybWF0aW9ucyBpbiB0aGUgZGF0YS4NCiAgU3BsaXQgdGhlIFBhcnRpY3VsYXJzIGNvbHVtbiBuYW1lIGFuZCBoYXZlIHRoZSBTdGF0ZSBpbiBzZXBlcmF0ZSBjb2x1bW4NCg0KYGBge3J9DQpsaWJyYXJ5KHNwbGl0c3RhY2tzaGFwZSkNCnJhd2RhdGEkUGFydGljdWxhcnMgPSBhcy5jaGFyYWN0ZXIocmF3ZGF0YSRQYXJ0aWN1bGFycykNCnJhd2RhdGEgPSBjU3BsaXQocmF3ZGF0YSwgIlBhcnRpY3VsYXJzIiwgIiAiKQ0KcmF3ZGF0YSA9IHJhd2RhdGFbICwgLWMoIlBhcnRpY3VsYXJzXzEiLCJQYXJ0aWN1bGFyc18yIiwiUGFydGljdWxhcnNfMyIsIlBhcnRpY3VsYXJzXzQiKV0NCiByYXdkYXRhJFN0YXRlID0gcGFzdGUocmF3ZGF0YSRQYXJ0aWN1bGFyc181LHJhd2RhdGEkUGFydGljdWxhcnNfNikNCiByYXdkYXRhID0gcmF3ZGF0YVsgLCAtYygiUGFydGljdWxhcnNfNSIsIlBhcnRpY3VsYXJzXzYiLCJYMy4yMDE0IildDQogcmF3ZGF0YSRTdGF0ZSA9IHN1YigiTkEiLCIiLHJhd2RhdGEkU3RhdGUpDQogDQogcmF3ZGF0YSRUb3RhbFN0YXRzID0gcmF3ZGF0YSRYMy4yMDA0K3Jhd2RhdGEkWDMuMjAwNStyYXdkYXRhJFgzLjIwMDYrcmF3ZGF0YSRYMy4yMDA3K3Jhd2RhdGEkWDMuMjAwOCtyYXdkYXRhJFgzLjIwMDkrcmF3ZGF0YSRYMy4yMDEwK3Jhd2RhdGEkWDMuMjAxMStyYXdkYXRhJFgzLjIwMTIrcmF3ZGF0YSRYMy4yMDEzDQogcmF3ZGF0YQ0KYGBgDQoNCiNTdGVwLTU6IEV4cGxvcmUgdGhlIERhdGE6IENyZWF0ZSB0aGUgMyAtIDQgaW5kaXZpZHVhbCB2aXN1YWxpc2F0aW9uIHRoYXQgZXhwbG9yZSB0aGUgZGF0YXNldC4NCg0KICBFeHBsb3JpbmcgdGhlIGRhdGEgYnkgY3JlYXRpbmcgdGhlIHZpc3VhbGlzYXRpb25zDQogIA0KICANCmBgYHtyfQ0KbGlicmFyeShnZ3Bsb3QyKQ0KbGlicmFyeShwbG90bHkpDQpsaWJyYXJ5KGtuaXRyKQ0KbGlicmFyeShEVCkNCg0KZ2dwbG90KHJhd2RhdGEpICsgYWVzKHJhd2RhdGEkU3RhdGUsd2VpZ2h0ID0gcmF3ZGF0YSRYMy4yMDA0ICwgY29sb3IgPSByYXdkYXRhJFN0YXRlKSArIGdlb21fYmFyKCkNCmdncGxvdChyYXdkYXRhKSArIGFlcyhyYXdkYXRhJFN0YXRlLHdlaWdodCA9IHJhd2RhdGEkWDMuMjAwNSkgKyBnZW9tX2JhcigpDQpnZ3Bsb3QocmF3ZGF0YSkgKyBhZXMocmF3ZGF0YSRTdGF0ZSx3ZWlnaHQgPSByYXdkYXRhJFgzLjIwMDYpICsgZ2VvbV9iYXIoKQ0KZ2dwbG90KHJhd2RhdGEpICsgYWVzKHJhd2RhdGEkU3RhdGUsd2VpZ2h0ID0gcmF3ZGF0YSRYMy4yMDA3KSArIGdlb21fYmFyKCkNCmdncGxvdChyYXdkYXRhKSArIGFlcyhyYXdkYXRhJFN0YXRlLHdlaWdodCA9IHJhd2RhdGEkWDMuMjAwOCkgKyBnZW9tX2JhcigpDQpnZ3Bsb3QocmF3ZGF0YSkgKyBhZXMocmF3ZGF0YSRTdGF0ZSx3ZWlnaHQgPSByYXdkYXRhJFgzLjIwMDkpICsgZ2VvbV9iYXIoKQ0KZ2dwbG90KHJhd2RhdGEpICsgYWVzKHJhd2RhdGEkU3RhdGUsd2VpZ2h0ID0gcmF3ZGF0YSRYMy4yMDEwKSArIGdlb21fYmFyKCkNCmdncGxvdChyYXdkYXRhKSArIGFlcyhyYXdkYXRhJFN0YXRlLHdlaWdodCA9IHJhd2RhdGEkWDMuMjAxMSkgKyBnZW9tX2JhcigpDQpnZ3Bsb3QocmF3ZGF0YSkgKyBhZXMocmF3ZGF0YSRTdGF0ZSx3ZWlnaHQgPSByYXdkYXRhJFgzLjIwMTIpICsgZ2VvbV9iYXIoKQ0KZ2dwbG90KHJhd2RhdGEpICsgYWVzKHJhd2RhdGEkU3RhdGUsd2VpZ2h0ID0gcmF3ZGF0YSRYMy4yMDEzKSArIGdlb21fYmFyKCkNCmdncGxvdChyYXdkYXRhKSArIGFlcyhyYXdkYXRhJFN0YXRlLHdlaWdodCA9IHJhd2RhdGEkVG90YWxTdGF0cykgKyBnZW9tX2JhcigpDQoNCmRhdGF0YWJsZShyYXdkYXRhLG9wdGlvbiA9IGxpc3QocGFnZWxlbmd0aCA9IDUpKQ0KDQpsaWJyYXJ5KGdncGxvdDIpDQpwbG90MSA9IGdncGxvdChyYXdkYXRhKSArIGFlcyhyYXdkYXRhJFN0YXRlLHJhd2RhdGEkVG90YWxTdGF0cyAsIGNvbG9yPXJhd2RhdGEkU3RhdGUgKSArIGdlb21fcG9pbnQoKQ0KDQpsaWJyYXJ5KHBsb3RseSkNCg0KZ2dwbG90bHkocGxvdDEpDQoNCmxpYnJhcnkoY3Jvc3N0YWxrKQ0KbGlicmFyeShkM3NjYXR0ZXIpDQoNCnNoYXJlZF9yYXdkYXRhIDwtIFNoYXJlZERhdGEkbmV3KHJhd2RhdGEpDQoNCmJzY29scygNCiAgbGlzdCgNCiAgICBmaWx0ZXJfY2hlY2tib3goIlN0YXRlIiwgIlN0YXRlU2VsZWN0Iiwgc2hhcmVkX3Jhd2RhdGEsIH5TdGF0ZSwgaW5saW5lID0gVFJVRSksDQogICAgZmlsdGVyX3NsaWRlcigiVG90YWxTdGF0cyIsICJUb3RhbFN0YXRzIiwgc2hhcmVkX3Jhd2RhdGEsIH5Ub3RhbFN0YXRzLCB3aWR0aCA9ICIxMDAlIikNCiAgKSwNCiAgZDNzY2F0dGVyKHNoYXJlZF9yYXdkYXRhLCB+VG90YWxTdGF0cywgflgzLjIwMDQsIH5TdGF0ZSwgd2lkdGg9IjEwMCUiLCBoZWlnaHQ9MzAwKSwNCiAgZDNzY2F0dGVyKHNoYXJlZF9yYXdkYXRhLCB+VG90YWxTdGF0cywgflgzLjIwMDUsIH5TdGF0ZSwgd2lkdGg9IjEwMCUiLCBoZWlnaHQ9MzAwKQ0KKQ0KDQpgYGA=